# -*- coding: utf-8 -*-
__author__ = 'chen'

import jieba

# Disabled example: full-mode segmentation (cut_all=True) of a sample
# product-review sentence.
# word_list = jieba.cut("衣服质量太差了！！！！颜色根本不纯！！",cut_all=True)

# Load the user dictionary file ./data/cu.txt into jieba. This runs before the
# segmentation call further down, presumably so that custom terms listed in
# that file are kept as single tokens -- TODO confirm against the file contents.
jieba.load_userdict("./data/cu.txt")

# Disabled examples: search-engine-mode segmentation (cut_for_search) of two
# sample strings, joined with "|" for printing.
# NOTE(review): the printed label below reads "full mode" even though these
# examples call cut_for_search rather than cut(..., cut_all=True).
# word_list = jieba.cut_for_search("衣服质量太差了！！！！颜色根本不纯！！")
# print("全模式: ","|".join(word_list))
# word_list = jieba.cut_for_search("高富帅白富美")
# print("全模式: ","|".join(word_list))

# Read the stop-word list from ./data/stopwords.txt, one entry per line.
# The ``with`` block guarantees the file handle is closed once reading is
# done, even if decoding a line raises.
with open("./data/stopwords.txt", encoding="utf-8") as file:
    # strip("\n") removes only newline characters from the ends of each line
    # (plain strip() with no argument would remove all surrounding whitespace).
    words = [line.strip("\n") for line in file]
print(words)

# Segment the sample sentence with jieba in full mode (cut_all=True).
word_list = jieba.cut("我们大家的白富美", cut_all=True)

# Hash-based copy of the stop-word list, built once: each membership test in
# the loop below is then a constant-time lookup instead of a linear scan of
# the ``words`` list.
stop_word_set = frozenset(words)

# Print every token that is not a stop word, one token per line.
for word in word_list:
    if word not in stop_word_set:
        print(word)






















